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AATCAAACAA AACACCAATG AftAACACCAA TGAAAACACC AATGACAGTA GCTTCAC^S 

AATCAAACAA AACACCAATG AAAACACC ; . . AATGACAGTA GCTTCaS CTCcS^GA^ 

AATCAhACAA AGCGGCAAAG A ,f , . Z^~\T. ^TTCAfecS CTC^T^ 

AATCAAACAA AACACCAATG SSg^ «^AGTA 

A^CAfttcAt AACACCAATG S' _ ' ' ^^ACTA GCTTCACCTA CTCGCTGAAA 
A^C^A^A^ ^^^g" "^^ ^Z^A CTCGCTGAAA 

AATCAAACAA AAC r" " - • - -GCACAA ACTTCAGCTA CTCGCTGAAA 

AATCAAACA^CAATG AAAACACc! . ! ! .* 1 1 ! | ! 1 1. AAIGCCAGTA £SS££ 

nmvnnfflw^ ^ ~ — - ct tc accta ^cxc-cTCA ftfr 



HIS 
BZ10 
B2198 

P20 

H38 
22491 

H41 
EG329 
PMC21 
EG327 
Consensu? 



C2 

AAAGACCTCA 
AAAGACCTCA 
AAAGACCTCA 
AAAGAGCTGA 
AAAGACCTCA 
AAAGACCTCA 
AAAGACCTCA 
AAAGACCTCA 
AAAGACCTCA 
AAAGACCTCA 
AAAGfo-CT-A 



CAGATCTGAC 
CAGATCTGAC 
CAGATCTGAC 
AAGACCTGAC 
CAGATCTGAC 
CAGGCCTGAT 
CAGGCCTGAT 
CAGATCTGAC 
CAGATCTGAC 
CAGATCTGAC 
-AG- ~CTGA- 



V2 



CAGTGTTGAA 
CAGTGTTGAA 
CAGTGTTGAA 
CAGTGTTGAA 
CAGTGTTGAA 
CAATGTTGAA 
CAATGTTGAA 
CAGTGTTGGA 
CAGTGTTGGA 
CAGTGTTGGA 
CA-TGTTG-A 



ACTGAAAAAT 
ACTGAAAAAT 
ACTGAAAAAX 
ACTGAAAAAT 
ACTGAAAAAT 
ACTGAAAAAT 
ACTGAAAAAT 
ACTGAAAAAT 
ACTGAAAAAT 
ACTGAAAAAT 
ACTGAAAAAT 



C3 



TATCGTTTGG 
TATCGTTTGG 
TATCGTTTGG 
TATCGTTTGG 
TATCGTTTGG 
TATCGTTTGG 
TATCGTTTGG 
TATCGTTTAG 
TATCGTTTAG 
TATCGTTTAG 
TATCGTTT-G 



CGCAAACGGT 
CGCAAACGGT 
CGCAAACGGT 
CGCAAACGGT 
CGCAAACGGC 
CGCAAACGGC 
CGCAAACGGC 
CGCAAACGGC 
CGCAAACGGC 
CGCAAACAGC 
CGCAAftC-G- 



C3 

490 

AATAAAGTCA 
AATAAAGTCA 
AATAAAGTCA 
AATAAAGTCA 
AATAAAGTCA 
AAGAAAGTCA 
AAGAAAGTCA 
AATAAAGTCA 
AATAAAGTCA 
AATAAAGTCA 
AAGAAAGTCA 



H15 
BZ10 
B2198 

P20 

H38 
Z2491 

H41 
EG329 
PMC21 
EG327 
consensus 



HIS 
BZ10 

BZ198 
P20 
H38 

Z2491 

EG329 
PMC21 
EG327 
consensus 



491 

ACATCACAAG 
ACATCACAAG 
ACATCACAAG 
ACATCACAAG 
ACATCACAAG 
ACATCATAAG 
ACATCATAAG 
ACATCACAAG 
ACATCACAAG 
ACATCACAAG 
ACATC A— AAGj 



CGACACCAAA 
CGACACCAAA 
CGACACCAAA 
CGACACCAAA 
CGACACCAAA 
CGACACCAAA 
CGACACCAAA 
CGACACCAAA 
CGACACCAAA 
CGACACCAAA 
CGACACCAAA 



GGCTTGAATT 
GGCTTGAATT 
GGCTTGAATT 
GGCTTGAATT 
GGCTTGAATT 
GGCTTGAATT 
GGCTTGAATT 
GGCTTGAATT 
GGCTTGAATT 
GGCTTGAATT 
GGCTTGAATT 



TTGCGAAAGA 
TTGCGAAAGA 
TTGCGAAAGA 
TTGCGAAAGA 
TCGCGAAAGA 
TCGCGAAAGA 
TCGCGAAAGA 
TTGCGAAAGA 
TTGCGAAAGA 
TCGCGAAAAA 
T-GCGAAA-A 



561 

TCATCTGAAC 
TCATCTGAAC 
TCATCTGAAC 
TCATCTGAAC 
TCATCTGAAC 
TCATCTGAAC 
TCATCTGAAC 
TCATCTGAAC 
TCATCTGAAC 
TCATCTGAAC 
TCATCTGAAC 



GGTATCGGTT 
GGTATCGGTT 
GGTATCGGTT 
GGTATCGGTT 
GGTATTGGTT 
GGTATCGGTT 
GGTATCGGTT 
GGTATTGGTT 
GGTATTGGTT 
GGTATCGGTT 
CCTAT-r^TT 



C3 



CGACTTTGAC 
CGACTTTGAC 
CGACTTTGAC 
CGACTTTGAC 
CGACTTTGAC 
CGACTTTGAC 
CGACTTTGAC 
CGACTTTGAC 
CGACTTTGAC 
CGACTTTGAC 
CGACTTTGAC 



C3 



CGATACGCTG 
CGATACGCTG 
CGATACGCTG 
CGATACGCTT 
CGATACGCTG 
CGATACGCTT 
CGATATGCTG 
CGATACGCTG 
CGATACGCTG 
CGATACGCTG 
CGAXA-GCT- 



AACGGCTGGG 
AACGGCTGGG 
AACGGCTGGG 
AACGGCTGGG 
AACGGCTGGG 
AACGGCTGGG 
AACGGCTGGG 
AACGGCTGGG 
AACGGCTGGG 
AACGGCTGAG 

AACGGCTG-tt 



ACGAACGGCG 
ACGAACGGCG 
ACGAACGGCG 
ACGAACGGCG 
ACGAACGGCG 
ACGAACGGCG 
ACGAACGGCG 
ACGAACGGCG 
ACGAACGGCG 
ACGAACGGCG 
AC-AACGGCG 



560 

ACCCCACGGT 
ACCCCACGGT 
ACCCCACGGT 
ACCCCACGGT 
ACACCACGGT 
ACACCACGGT 
ACACCACGGT 
ACACCACGGT 
ACACCACGGT 
ACACCACGGT 
AC-CCACGGT 



CTGAATACCG 
CTGAATACCG 
CTGAATACCG 
GCGGGTTCTT 
CTGAATACCG 
GCGGGTTCTT 
CTGAATACCG 
CTGAATACCG 
CTGAATACCG 
CTGAATACCG 



GAGCGACCAC 
GAGCGACCAC 
GAGCGACCAC 
CTGCTTCTCA 
GAGCGACCAC 
CTGCTTCTCA 
GAGCGACCAC 
GAGCGACCAC 
GAGCGACCAC 
GAGCGACCAC 



630 

AAACGTAACC 
-AAACGTAACC 
AAACGTAACC 
CGTTGATGCG 
AAACGTAACC 
CGTTGATGCG 
AAACGTAACC 
AAACGTAACC 
AAACGTAACC 
AAACGTAACC 
— G C~ 



V3 



FIG. 2cont 



HIS 
BZ10 
BZ198 

P20 

H38 
Z2491 

H41 
EG329 
PMC21 
EG327 
Consensus 



CGACAAC^^ 



€31 

aacgacaac^Raccgatga 

AACGACAACG TTACCGATGA 
AACGACAACG TTACCGATGA 
GGTAACCAAA GTACACATTA 
AACGACAACG TTACCGATGA 
GGTAACCAAA GTACACATTA 
AACGACAACG TTACCGATGA 
AACGACAACG TTACCGATGA 
AACGACAACG TTACCGATGA 
AACGACAACG TTACCGATGA 
~ AC -A TAG — AT- A 



V3 

701 

HIS ACATTAAAGG CGTTAAACCC 
BZ10 ACATTAAAGG CGTTAAACCC 
BZ198 ACATTAAAGG CGTTAAACCC 
P20 ATATTAAGGG TGTTAAAACT 
H38 ACATTAAAGG CGTTAAACCC 
22 491 ATATTAAGGG TGTTAAAACT 
H41 ACATTAAAGG CGTTAAACCC 
EG329 ACATTAAAGG CGTTAAACCC 
PMC21 ACATTAAAGG CGTTAAACCC 
EG327 ACATTAAAGG CGTTAAACCC 
Consensus AzAttaa-gg -gttaaa-C- 
C4 



CGAGAAAAAA 
CGAGAAAAAA 
CGAGAAAAAA 

C ACT 

CAAGAAAAAA 

C ACT 

CGAGAAAAAA 
CGAGAAAAAA 
CGAGAAAAAA 
CGAGAAAAAA 
C~- A-- 



CGTGCGGCAA 
CGTGCGGCAA 
CGTGCGGCAA 
CGTGCAGCAA 
CGTGCGGCAA 
CGTGCAGCAA 
CGTGCGGCAA 
CGTGCGGCAA 
CGTGCGGCAA 
CGTGCGGCAA 
CGTGC-GCAA 



GCGTTAAAGA 
GCGTTAAAGA 
GCGTTAAAGA 
GTATTAAGGA 
GCGTTAAAGA 
GTATTAAGGA 
GCGTTAAAGA 
GCGTTAAAGA 
GCGTTAAAGA 
GCGTTAAAGA 
G^-TTAA-GA 



CGTATTAAAC 
CGTATTAAAC 
CGTATTAAAC 
TGTGTTGAAT 
CGTATTAAAC 
TGTGTTGAAT 
CGTATTAAAC 
CGTATTAAAC 
CGTATTAAAC 
CGTATTAAAC 
-GT-TT-AA- 



C4 



700 

GCAGGCTGGA 
GCAGGCTGGA 
GCAGGCTGGA 
GCGGGTTGGA 
GCAGGCTGGA 

gcgggttgga 
gcaggctgga 
gctggctgga 
gctggctgga 

GCAGGCTGGA 
GC— GG— Tcna 



GGTACAACAG CT TC CGATAACGTT 

GGTACAACAG CT TC CGATAACGTC 

GGTACAACAG CT TC CGATAACGTT 

GGCTCAACAA CTGGTCAATC AGAAAATGTC 

GGTACAACAG CT TC CGATAACGTT 

GGCTCAACAA CTGGTCAATC AGAAAATGTC 

GGTACAACAG CT TC CGATAACGTT 

GGTACAACAG CT TC CGATAACGTT 

GGTACAACAG CT TC CGATAACGTT 

GGTACAACAG CT TC CGATAACGTT 

GG— CAACA - CT TC -GA-AA-GT- 

V4 



GATTTCGTCC 
GATTTCGTCC 
GATTTCGTCC 
GATTTCGTCC 
GATTTCGTCC 
GATTTCGTCC 
GATTTCGTCC 
GATTTCGTCC 
GATTTCGTCC 
GATTTCGTCC 
GATTTCG TCC 



C5 



770 

GCACTTACGA 
GCACTTACGA 
GCACTTACGA 
GCACTTACGA 
ACACTTACGA 
GCACTTACGA 
GCACTTACGA 
GCACTTACGA 
GCACTTACGA 
GCACTTACGA 
-GACTTACGA 



HIS 
BZ10 
BZ198 

P20 

H38 
Z2491 

H41 
EG329 
PMC21 
EG327 
Consensus 



771 

CACAGTCGAG 
CACAGXCGAG 
CACAGTCGAG 
CACAGTCGAG 
CACAGTCGAG 
CACAGTCGAG 
CACAGTCGAG 
CACAGTCGAG 
CACAGTCGAG 
CACAGTCGAG 
CACAGTCGAG 



TTCTTGAGCG 
TTCTTGAGCG 
TTCTTGAGCG 
TTCTTGAGCG 
TTCTTGAGCG 
TTCTTGAGCG 
TTCTTGAGCG 
TTCTTGAGCG 
TTCTTGAGCG 
TTCTTGAGCG 
TTCTTGAGCjS, 



CAGATACGAA 
CAGATACGAA 
CAGATACGAA 
CAGATACGAA 
CAGATACGAA 
CAGATACGAA 
CAGATACGAA 
CAGATACGAA 
CAGATACGAA 
CAGATACGAA 
CAGATACGAA 



AACAACGACT 
AACAACGACT 
AACAACGACT 
AACAACGACT 
AACAACGACT 
AACAACGACT 
AACAACGACT 
AACAACGACT 
AACAACGACT 
AACAACGACT 
AACAACGACT 



HIS 
BZ10 
BZ198 

P20 

H36 
Z2491 

H41 
EG329 
PMC21 
EG327 
Consensus 



841 

AAAACCGAAG 
AGAACCGAAG 
AAAACCGAAG 
AGAACCGAAG 
AGAACCGAAG 
AGAACCGAAG 
AAAACCGAAG 
AAAACCGAAG 
AAAACCGAAG 
AGAACCGAAG 
A-AAC C GAAG 



TTAAAATCGG 
TTAAAATCGG 
TTAAAATCGG 
TTAAAATCGG 
TTAAAATCGG 
TTAAAATCGG 
TTAAAATCGG 
TTAAAATCGG 
TTAAAATCGG 
TTAAAATCGG 
TTAAAATCGG 



TGCGAAGACT 
TGCGAAGACT 
TGCGAAGACT 
TGCGAAGACT 
TGCGAAGACT 
TGCGAAGACT 
TGCGAAGACT 
TGCGAAGACT 
TGCGAAGACT 
TGCGAAGACT 
TGCGAAGACT^ 



C5 



TCTGTTATTA 
rCTGTTATTA 
TCTGTTATTA 
TCTGTTATTA 
TCTGTTATTA 
TCTGTTATTA 
TCTGTTATTA 
TCTGTTATTA 
TCTGTTATTA 

tctgttatca 
tctctta t-a 



GTTAATGTGG 
GTTAATGTGG 
GTTAATGTGG 
GTTAATGTGG 
GTTAATGTGG 
GTTAATGTGG 
GTTAATGTGG 
GTTAATGTGG 
GTTAATGTGG 
GTTAATGTGG 
G^AAT GTGG 



AAAGCAAAGA 
AAAGCAAAGA 
AAAGCAAAGA 
AAAGCAAAGA 
AAAGCAAAGA 
AAAGCAAAGA 
AAAGCAAAGA 
AAAGCAAAGA 
AAAGCAAAGA 
AAAGCAAAGA 
AAAGCAAAG^ 



840 

CAACGGCAAG 
CAACGGCAAG 
CAACGGCAAG 
CAACGGCAAG 
CAACGGCAAG 
CAACGGCAAG 
CAACGGCAAG 
CAACGGCAAG 
CAACGGCAAG 
CAACGGCAAG 
CAACGGCAAG 



C5 



AAGAAAAAGA 
AAGAAAAAGA 
AAGAAAAAGA 
AAGAAAAAGA 
AAGAAAAAGA 
AAGAAAAAGA 
AAGAAAAAGA 
AAGAAAAAGA 
AAGAAAAAGA 
AAGAAAAAGA 
AAGAAAAAGA 



CGGTAAGTTG 
CGGTAAGTTG 
CGGTAAGTTG 
CGGTAAGTTG 
CGGTAAGTTG 
CGGTAAGTTG 
CGGTAAGTTG 
CGGTAAGTTG 
CGGTAAGTTG 
CGGTAAGTTG 
.CGGTAAGTTG 



910 

GTTACTGGTA 
GTTACTGGTA 
GTTACTGGTA 
GTTACTGGTA 
GTTACTGGTA 
GTTACTGGTA 
GTTACTGGTA 
GTTACTGGTA 
GTTACTGGTA 
GTTACTGGTA 
GTTACTGGTA 



HIS 
BZ10 
BZ198 

WZ0 

H3B 
22491 

H41 
EG329 
PMC2 1 
EG327 
Consensus 



911 

AAGGCAAAGA 
AAGGCAAAGG 
AAGGCAAAGA 
AAGGCAAAGG 
AAGGCAAAGG 
AAGGCAAAGG 
AAGGCAAAGG 
AAGACAAAGG 
AAGACAAAGG 
AAGACAAAGG 



CGAGAATGGT 
CGAGAATGGT 
CGAGAATGGT 
CGAGAATGGT 
CGAGAATGGT 
CGAGAATGGT 
CGAGAATGGT 
CGAGAATGGT 
CGAGAATGGT 
CGAGAATGAT 
CGAGAATG-T 



TCTTCTACAG 
TCTTCTACAG 
TCTTCTACAG 
TCTTCTACAG 
TCTTCTACAG 
TCTTCTACAG 
TCTTCTACAG 
TCTTCTACAG 
TCTTCTACAG 
TCTTCTACAG 
TCTTCTACAG, 



ACGAAGGCGA 
ACGAAGGCGA 
ACGAAGGCGA 
ACGAAGGCGA 
ACGAAGGCGA 
ACGAAGGCGA 
ACGAAGGCGA 
ACGAAGGCGA 
ACGAAGGCGA 
ACAAAGGCGA 
AC-AAGGCCA 



C5 



aggcttagtg 
aggc'ttagtg 
aggcttagtg 
aggcttagtg 

AGGCTTAGTG 
AGGCTTAGTG 
AGGCTTAGTG 
AGGCTTAGTG 
AGGCTTAGTG 
AGGCTTAGTG 
AGGC , TTAgTO 



ACTGCAAAAG 
ACTGCAAAAG 
ACTGCAAAAG 
ACTGCAAAAG 
ACTGCAAAAG 
ACTGCAAAAG 
ACTGCAAAAG 
ACTGCAAAAG 
ACTGCAAAAG 
ACTGCAAAAG 
ACTGCAAAAg 



980 

AAGTGATTGA 
AAGTGATTGA 
AAGTGATTGA 
AAGTGATTGA 
AAGTGATTGA 
AAGTGATTGA 
AAGTGATTGA 
AAGTGATTGA 
AAGTGATTGA 
AAGTGATTGA 
AAGTGATTGA 



FIG. 2cont. 



HIS 
8210 
BZ198 

P20 

H38 
Z2491 

H41 
EG329 
PMC21 
BG327 
Consensus 



991 

tgcagtaaac 
tgcagtaaac 
tgcagtaaac 
tgcagtaaac 
tgcagtaaag 

TGCAGTAAAC 
TGCAGTAAAC 
TGCAGTAAAC 
TGCAGTAAAC 
TGCAGTAAAC 
TGCAGTAAAC 



AAGGCTGGTT 
AAGGCTGGTT 
AAGGCTGGTT 
AAGGCTGGTT 
AAGGCTGGTT 
AAGGCTGGTT 
AAGGCTGGTT 
AAGGCTGGTT 
AAGGCTGGTT 
AAGGCTGGTT 
AAGGCTGGTT 



GGAGAATGAA AACAACAACC 
GGAGAATGAA AACAACAACC 
GGAGAATGAA AACAACAACC 
GGAGAATGAA AACAACAACC 
GGAGAATGAA AACAACAACC 
GGAGAATGAA AACAACAACC 
GGAGAATGAA AACAACAACC 
GGAGAATGAA AACAACAACC 
GGAGAATGAA AACAACAACC 
GGAGAATGAA AACAACAACC 
GGAGAATGAA AACAACAArr 

'7> C5 



GCTAATGGTC 
GCTAATGGTC 
GCTAATGGTC 
GCTAATGGTC 
GCTAATGGTC 
GCTAATGGTC 
GCTAATGGTC 
GCTAATGGTC 
GCTAATGGTC 
GCTAATGGTC 
GCTAAT GG-rr 



AAACAGGTCA 
AAACAGGTCA 
AAACAGGTCA 
AAACAGGTCA 
AAACAGGTCA 
AAACAGGTCA 
AAACAGGTCA 
AAACAGGTCA 
AAACAGGTCA 
AAACAGGTCA 
AAACAGGTCA, 



1050 
AGCTGACAAG 
AGCTGACAAG 
AGCTGACAAG 
AGCTGA^AG 
AGCTGACAAG 
AGCTGACAAG 
AGCTGACAAG 
AGCTGACAAG 
AGCTGACAAG 
AGCTGACAAG 
AgCTGACAAff 



1051 
HIS TTTGAAACCG 
B21;g TTTGAAACCG 
BS198 TTTGAAACCG 
F20 TTTGAAACCG 
H38 TTTGAAACCG 
22491 TTTGAAACCG 
H4 1 TTTGAAACCG 
EG329 TTTGAAACCG 
PWCZ 1 ; TTTGAAACCG 
BG327 "TTTGAAACCG 
Consensus TTTGAAACCG 



TTAGAlfCAGG CACAAAAGTA 
TTACATCAGG. ^CACAAAAGTA 
TTACATCAGG^GAAATGTA 
TTACATCAGG .CACAAAAGTA 
^TTACATCAGG CACAAATGTA 
OTAGATCAGG CACAAATGTA 
.^TA^ATCAGG CACAAAAGTA 
TTACATCAGG CACAAATGTA 
TTACATCAGG CACAAATGTA 
TTACATCAGG CACAAATGTA 
TTACATCAGG CACAAA-CTA 



AGCTTTGCTA GTGGTAATGG 
ACCTTTGCTA GTGGTAATGG 
ACCTTTGCTA GTGGTAAAGG 
ACCTTTGCTA GTGGTAATGG 
ACCTTTGCTA GTGGTAAAGG 
ACCTTTGCTA GTGGTAAAGG' 
ACCTTTGCTA GTGGTAATGG 
ACCTTTGCTA GTGGTAAAGG 
, ACCTTTGCTA GTGGTAAAGG 
ACCTTTGCTA GTGGTAAAGG 
ACCTTTGCTA GTGGTAA-^ 



C5 



TACAACTGCG 
TACAACTGCG 
TACAACTGCG 
TACAACTGCG 
TACAACTGCG 
TACAACTGCG 
TACAACTGCG 
TACAACTGCG 
TACAACTGCG 
TACAACTGCG 
TACAACTGCG 



1120 
ACTGTAAGTA 
ACTGTAAGTA 
ACTGTAAGTA 
ACTGTAAGTA 
ACTGTAAGTA 
ACTGTAAGTA 
ACTGTAAGTA 
ACTGTAAGTA 
ACTGTAAGTA 
ACTGTAAGTA 
ACTGTAAGTA 



HIS 
BZ10 
BZ198 

P20 

H38 
Z2491 

H41 
EG329 
PMC21 
BG327 
Consensus 



1121 

AAGATGATCA 
AAGATGATCA 
AAGATGATCA 
AAGATGATCA 
AAGATGATCA 
AAGATGATCA 
AAGATGATCA 
AAGATGATCA 
AAGATGATCA 
AAGATGATCA 
AAGATGATCA 



AGGCAACATC ACTGTTAAGT 
AGGCAACATC ACTGTTAAGT 
AGGCAACATC ACTGTTAAGT 
AGGCAACATC ACTGTTAAGT 
AGGCAACATC ACTGTTAAGT 
AGGCAACATC ACTGTTATGT 
AGGCAACATC ACTGTTAAGT 
AGGCAACATC ACTGTTATGT 
AGGCAACATC ACTGTTATGT 
AGGCAACATC ACTGTTATGT 
AGGCAACATC _ ACTGTTA-GT 



ATGATGTAAA TGTCGGCGAT 
ATGATGTAAA TGTCGGCGAT 
ATGATGTAAA TGTCGGCGAT 
ATGATGTAAA TGTCGGCGAT 
ATGATGTAAA TGTCGGCGAT 
ATGATGTAAA -TGTCGGCGAT 
ATGATGTAAA TGTCGGCGAT 
ATGATGTAAA TGTCGGCGAT 
ATGATGTAAA TGTCGGCGAT 
ATGATGTAAA TGTCGGCGAT 
ATGATGTA AAjGTCGGCGAT 

C5 



GCCCTAAACG 
GCCCTAAACG 
GCCCTAAACG 
GCCCTAAACG 
GCCCTAAACG 
GCCCTAAACG 
GCCCTAAACG 
GCCCTAAACG 
GCCCTAAACG 
GCCCTAAACG 
GCCCTAAACG 



1190 
TCAATCAGCT 
TCAATCAGCT 
TCAATCAGCT 
TCAATCAGCT 
TCAATCAGCT 
TCAATCAGCT 
TCAATCAGCT 
TCAATCAGCT 
TCAATCAGCT 
TCAATCAGCT 

TCAATCAGCT 



HIS 
BZ10 
BZ198 

P20 

H38 
Z2491 

H41 
EG329 
PMC21 
EG327 
Consensus 



HIS 
BZIQ 
BZ196 

P20 

U38 
Z2491 

H41 
EG329 
PMC21 
EG327 
Consensus 



1191 

GCAAAACAGC 
GCAAAACAGC 
GCAAAACAGC 
GCAAAACAGC 
GCAAAACAGC 
GCAAAACAGC 
GCAAAACAGC 
GCAAAACAGC 
GCAAAACAGC 
GCAAAACAGC 
GCAAAACAGC 



GGTTGGAATT 
GGTTGGAATT 
GGTTGGAATT 
GGTTGGAATT 
GGTTGGAATT 
GGTTGGAATT 
GGTTGGAATT 
GGTTGGAATT 
GGTTGGAATT 
GGTTGGAATT 
GGTTGGAATT ^ 



TGGATTCCAA AGCGGTTGCA 
TGGATTCCAA AGCGGTTGCA 
TGGATTCCAA AGCGGTTGCA 
TGGATTCCAA AGCGGTTGCA 
TGGATTCCAA AGCGGTTGCA 
TGGATTCCAA AGCGGTTGCA 
TGGATTCCAA AGCGGTTGCA 
TGGATTCCAA AGCGGTTGCA 
TGGATTCCAA AGCGGTTGCA 
TGGATTCCAA AGCGGTTGCA 
JfiSATTCCAA, . AGCGGTTG CA, 

C5 



GGTTCTTCGG 
GGTTCTTCGG 
GGTTCTTCGG 
GGTTCTTCGG 
GGTTCTTCGG 
GGTTCTTCGG 
GGTTCTTCGG 
GGTTCTTCGG 
GGTTCTTCGG 
GGTTCTTCGG 
GGTTCTTCGG 



GCAAAGTCAT 
GCAAAGTCAT 
GCAAAGTCAT 
GCAAAGTCAT 
GCAAAGTCAT 
GCAAAGTCAT 
GCAAAGTCAT 
GCAAAGTCAT 
GCAAAGTCAT 
GCAAAGTCAT 
GCAAAGTCAT 



1260 
CAGCGGCAAT 
CAGCGGCAAT 
CAGCGGCAAT 
CAGCGGCAAT 
CAGCGGCAAT 
CAGCGGCAAT 
CAGCGGCAAT 
CAGCGGCAAT 
CAGCGGCAAT 
CAGCGGCAAT 
CAGCGGCAAT 



1261 

GTTTCGCCGA 
GTTTCGCCGA 
GTTTCGCCGA 
GTTTCGCCGA 
GTTTCGCCGA 
GTTTCGCCGA 
GTTTCGCCGA 
GTTTCGCCGA 
GTTTCGCCGA 
GTTTCGCCGA 
GTTTCGCCGA 



GCAAGGGAAA 
GCAAGGGAAA 
GCAAGGGAAA 
GCAAGGGAAA 
GCAAGGGAAA 
GCAAGGGAAA 
GCAAGGGAAA 
GCAAGGGAAA 
GCAAGGGAAA 
GCAAGGGAAA 
GCAAGGGAAA 



GATGGATGAA 
GATGGATGAA 
GATGGATGAA 
GATGGATGAA 
GATGGATGAA 
GATGGATGAA 
GATGGATGAA 
GATGGATGAA 
GATGGATGAA 
GATGGATGAA 
GATGGATGAA 



ACCGTCAACA 
ACCGTCAACA 
ACCGTCAACA 
ACCGTCAACA 
ACCGTCAACA 
ACCGTCAACA 
ACCGTCAACA 
ACCGTCAACA 
ACCGTCAACA 
ACCGTCAACA 
ACCGTCAACA 



C5 



TTAATGCCGG 
TTAATGCCGG 
TTAATGCCGG 
TTAATGCCGG 
TTAATGCCGG 
TTAATGCCGG 
TTAATGCCGG 
TTAATGCCGG 
TTAATGCCGG 
TTAATGCCGG 
TTAATGCrf^n 



CAACAACATC 
CAACAACATC 
CAACAACATC 
CAACAACATC 
CAACAACATC 
CAACAACATC 
CAACAACATC 
CAACAACATC 
CAACAACATC 
CAACAACATC 
CAACAACATC 



1330 
GAGATTACCC 
GAGATTACCC 
GAGATTACCC 
GAGATTACCC 
GAGATTACCC 
GAGATTAGCC 
GAGATTACCC 
GAGATTACCC 
GAGATTACCC 
GAGATTACCC 
JGAGATTA-CC 



FIG. 2cont. 



H15 
B210 
BZ198 

P20 

H38 
Z2491 

H41 
EG329 
PMC21 
EG327 
Consensus 



1331 

GCAACGGCAA 
GCAACGGCAA 
GCAACGGTAA 
GCAACGGCAA 
GCAACGGTAA 
GCAACGGTAA 
GCAACGGCAA 
GCAACGGTAA 
GCAACGGTAA 
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GCAGCAAGGA TGCCAACAAA 
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CCAGCAAG-A — CAArA fl* 
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1 MNKIYRIIWN SALNAWWVS ELTRNHTKRA SATVKTAVLA TLLFATVQAS 

51 ANNETDLTSV GTEKLSFSAN GNKVNITSDT KGLNFAKETA GTNGDTTVHX, 

101 NGIGSTLTDT LLNTGATTNV TNDNVTDDEK KRAASVKDVL NAGWNIKGVK 

151 PGTTASDNVD FVRTYDTVEF LSADTKTTTV NVESKDNGKK TEVKIGAKTS 

201 VI KEKDGKLV TGKDKGENGS STDEGEGLVT AKEVIDAVNK AGWFtMKTTTA 

2S1 NGQTGQADKF ETVTSGTNVT FASGKGTTAT VSKDDQGNIT VMYDVNVGDA 

301 LNVNQLQNSG WNLDSKAVAG SSGKVISGNV SPSKGKMDET VNINAGNNIE 

351 ITRNGKNIDI ATSMTPQFSS VSLGAGADAP TLSVDGDALN VGSKKDNKPV 

401 RITNVAPGVK EGDVTNVAQL KGVAQNLNNR IDNVDGNARA GIAQAIATAG 

451 LVQAYLPGKS MMAIGGGTYR GEAGYAIGYS SISDGGNWII KGTASGNSRG 

501 HFGASASVGY QW* 



1 ATGAACAAAA TATACCGCAT CATTTGGAAT AGTGCCCTCA ATGCATGGGT 

j«3 51 CGTCGTATCC GAGCTCACAC GCAACCACAC CAAACGCGCC TCCGCAACCG 

101 TGAAGACCGC CGTATTGGCG ACTCTGTTGT TTGCAACGGT TCAGGCAAGT 

• 151 GCTAACAATG AAACAGATCT GACCAGTGTT GGAACTGAAA AATTATCGTT 

201 TAGCGCAAAC GGCAATAAAG TCAACATCAC AAGCGACACC AAAGGCTTGA 

' J 251 ATTTTGCGAA AGAAACGGCT GGGACGAACG GCGACACCAC GGTTCATCTG 

iU 301 AACGGTATTG GTTCGACTTT GACCGATACG CTGCTGAATA CCGGAGCGAC 

351 CACAAACGTA ACCAACGACA ACGTTACCGA TGACGAGAAA AAACGTGCGG 

401 CAAGCGTTAA AGACGTATTA AACGCTGGCT GGAACATTAA AGGCGTTAAA 

J;H ' 451 CCCGGTACAA CAGCTTCCGA TAACGTTGAT TTCGTCCGCA CTTACGACAC 

Sy 501 AGTCGAGTTC TTGAGCGCAG ATACGAAAAC AACGACT GT T AATGTG GAAA 

si 551 GCAAAGACAA CGGCAAGAAA ACCGAAGTTA AAATCGGTGC GAAGACTTCT 

|;3 601 GTTATTAAAG AAAAAGACGG TAAGTTGGTT ACTGGTAAAG ACAAAGGCGA 

1*2 651 GAATGGTTCT TCTACAGACG AAGGCGAAGG CTTAGTGACT GCAAAAGAAG 

701 TGATTGATGC AGTAAACAAG GCTGGTTGGA GAATGAAAAC AACAACCGCT 

IU 751 AATGGTCAAA CAGGTCAAGC TGACAAGTTT GAAACCGTTA CATCAGGCAC 

|f] 801 AAATGTAACC TTTGCTAGTG GTAAAGGTAC AACTGCGACT GTAAGTAAAG 

O 851 ATGATCAAGG CAACATCACT GTTATGTATG ATGTAAATGT CGGCGATGCC 

12 901 CTAAACGTCA ATCAGCTGCA AAACAGCGGT T GGAATTTGG ATTCCAAAGC 

" " 951 GGTTGCAGGT TCTTCGGGCA AAGTCATCAG CGGCAATGTT TCGCCGAGCA 

10 01 AGGGAAAGAT GGATGAAACC GTCAACATTA ATGCCGGCAA CAACATCGAG 

1051 ATTACCCGCA ACGGTAAAAA TATCGACATC GCCACTTCGA TGACCCCGCA 

1101 GTTTTCCAGC GTTTCGCTCG GCGCGGGGGC GGATGCGCCC ACTTTGAGCG 

1151 TGGATGGGGA CGCATTGAAT GTCGGCAGCA AGAAGGACAA CAAACCCGTC 

1201 CGCATTACCA ATGTCGCCCC GGGCGTTAAA GAGGGGGATG TTACAAACGT 

1251 CGCACAACTT AAAGGCGTGG CGCAAAACTT GAACAACCGC ATCGACAATG 

1301 TGGACGGCAA CGCGCGTGCG GGCATCGCCC AAGCGATTGC AACCGCAGGT 

1351 CTGGTTCAGG CGTATTTGCC CGGCAAGAGT ATGATGGCGA TCGGCGGCGG 

14 01 CACTTATCGC GGCGAAGCCG GTTACGCCAT CGGCTACTCC AGTATTTCCG 

1451 ACGGCGGAAA TTGGATTATC AAAGGCACGG CTT CCGGCAA TTCGCGCGGC 

1S01 CATTTCGGTG CTTCCGCATC TGTCGGTTAT CAGTGGTAA 
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1 MNKIYRXIWN SALNAWVAVS ELTRNHTKRA SATVKTAVIA TLLFATVQAN 

SI ATDETGLINV ETEKLSFGAN GKKVNIISDT KGLNFAKETA GTNGDTTVHL 

101 NGIGSTLTDM LLNTGATTNV TNDNVTDDEK KRAASVKDVL NAGWN I KG VK 

151 PGTTASDNVD FVRTYDTVEF tSADTKTTTV NVESKDNGKK ZJS 

201 VIKEKDGKLV TGKGKGENGS STDEGEGLVT AKEVIDAVNK AGwSS^S 

251 NGQTGQADKF ETVTSGTKVT FASGNGTTAT VSKDDQGNIT VKYDVNVGDA 

301 LNVNQLQNSG WNLDSKAVAG SSGKVISGNV SPSKGKMDET WINAG^E 

351 ITRNGKN1DI ATSMTPQFSS VSLGAGADAP TLSVDDEGAL MVGSKDAnJp 

401 VRITNVAPGV KEGDVTNVAQ LKGVAQNLNN RI DNVNGNAR aS^S 

soi SEEK 55""" MB "" M " ssrSA ' GNWI xk^Sg^r 



i 

51 



ATGAACAAAA TAT AC C G CAT CATTTGGAAT AGTGCCCTCA ATGCCT GGGT 
CGCCGTATCC GAGCTCACAC GCAACCACAC CAAACGCGCC TCCGCAACCG 

101 TGAAGACCGC CGTATTGGCG ACACTGTTGT TTGCAACGGT TCAGGCGAAT 

151 GCTACCGATG AAACAGGCCT GATCAATGTT GAAACTGAAA AATTATCGTT 

201 TGGCGCAAAC GGCAAGAAAG T CAAC AT CAT AAGCGACACC AAAGGCTTGA 

25 1 ATTTCGCGAA AGAAACGGCT GGGACGAACG GCGACACCAC GGTTCATCTG 

301 AACGGTATCG GTTCGACTTT GACCGATATG CTGCTGAATA CCGGAGCGAC 

351 CACAAACGTA ACCAACGACA ACGTTACCGA TGACGAGAAA AAACGTGCGG 

401 CAAGCGTTAA AGACGTATTA AACGCAGGCT GGAACATTAA AGGCGTTAAA 

451 CCCGGTACAA CAGCTTCCGA TAACGTTGAT TTCGTCCGQA CTTACGACAC 

501 AGTCGAGTTC TTGAGCGCAG ATACGAAAAC AACGACTGTT AATGTGGAAA 

551 GCAAAGACAA CGGCAAGAAA ACCGAAGTTA AAATCGGTGC GAAGACTTCT 

601 GTTAT taaag AAAAAGACGG TAAGTTGGTT actggtaaag gcaaaggcga 

651 gaatggttct tctacagacg aaggcgaagg cttagtgact gcaaaagaag 

701 tgattgatgc agtaaacaag gctggttgga gaatgaaaac aacaaccgct 

751 AATGGTCAAA CAGGTCAAGC TGACAAGTTT GAAACCGTTA CATCAGGCAC 

801 AAAAGTAACC TTTGCTAGTG GTAATGGTAC AACTGCGACT GTAAGTAAAG 

851 ATGATCAAGG CAACATCACT GTTAAGTATG ATGTAAATGT CGGCGATGCC 

901 CTAAACGTCA ATCAGCTGCA AAAC AG CGGT TGGAATTTGG ATTCCAAAGC 

951 GGTTGCAGGT TCTTCGGGCA AAGT CATCAG CGGCAATGTT TCGCCGAGCA 

1001 AGGGAAAGAT GGAT GAAACC GTCAACATTA ATGCCGGCAA CAACATCGAG 

1051 ATTACCCGCA ACGGCAAAAA T AT CGACATC GCCACTTCGA TGACCCCGCA 

1101 ATTTTCCAGC GTTTCGCTCG GCGCGGGGGC GGATGCGCCC ACTTTAAGCG 

1151 TGGATGACGA GGGCGCGTTG AATGTCGGCA GCAAGGATGC CAACAAACCC 

1201 GTCCGCATTA CCAATGTCGC CCCGGGCGTT AAAGAGGGGG ATGTTACAAA 

1251 CGTCGCGCAA CTTAAAGGTG TGGCGCAAAA CTTGAACAAC CGCAT CGACA 

1301 ATGTGAACGG CAACGCGCGT GCGGGCATCG CCCAAGCGAT TGCAACCGCA 

1351 GGTCTGGTTC AGGCGTATCT GCCCGGCAAG AGTATGATGG CGATCGGCGG 

14 01 CGGCACTTAT CTCGGCGAAG CCGGTTATGC CATCGGCTAC TCAAGCATTT 

1451 CCGCCGGCGG AAATTGGATT ATCAAAG GCA CGGCTTCCGG CAATTCGCGC 

1501 GGCCATTT CG GTGCTTCCGC ATCTGTCGGT TAT CAGTGGT AA 
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1 MNKIYRIIWN SALNAWVWS ELTRNHTKRA SATVKTAVLA TLLFATVOA* 

SK25 ESS SHE sssss SS 

.. SSS52 SSSS 2S5SK S 

jSSS^" GOTRSEA « EWIIKS ^ £££££ 



351 

401 ASVGYQW 



ATGAACAAAA TATACCGCAT CATTTGGAAT ar,Trrrr«nr, 
CGTCGTATCC GAGCTCACAC JSSSS iSSSS 

TGAAGACCGC CGTATTGGCG ACTCTGTTGT S£SSS JSS£SS 
SSIJSS 06 TTGATTTCST CCGCACTTAC GACACAGTCG 
CGCAGATACG AAAACAACGA CTGTTAATGT GGAAAGCAAA GAGAA^rSf 

agaaaaccga agttaaaatc ggtgcgaaga cttctg™ ?JSSSaS 

GACGGTAAGT TGGTTACTGG TAAAGACAAA c£255S 

AGACGAAGGC gaaggcttag tgactgcaaa agaagtgat? SSSa^JS 

ACAAGGCTGG TTGGAGAATG AAAACAACAA CCGCTAATGG raSiSi^ 
SJSSS 0 " AGTTTGAAAC CGTTACATCA SgSSESS 5£?£SE 
^SJSSS? C GACTGTAAG T AAAGAT GAT 5E£3S£ 
T CACTGTTAT GTATGATGTA AATGTCGGCG ATGCCCTAAA CGTC-a&tv^TP 
CTGCAAAACA GCGGTTGGAA TTTGGATTCC AAAGCGGTTG 
GGGCAAAGTC ATCAGCGGCA ATGTTTCGCC GAGCAAGGGA AaSgSJJ 
AAACCGTCAA CATTAATGCC GGCAACAACA TCgSJtSS 
AAAAATATCG ACATCGCCAC TTCGATGACC CCGCAGTTTT cSSg'SJ^^ 

SSSSS SSSSSS -gStgS? sssss 

oX, rGAATGTCGG CAGCAAGAAG GACAACAAAC CCGTCCGCAT TACCAATrTr 

SJ SSSSSSS SSST* ggatgttaca aacgtcS 

951 CGTGGCGCAA AACTTGAACA ACCGCATCGA CAATGTGGAC GGCAACGCCr 

JS!? ^ GCGGGCAT C<5CCCAAGCG ATTGCAACCG CAGGTCTGGT 

1051 TTGCCCGGCA AG AGT AT GAT GGCGATCGGC GGCGGCACTT ATCGCgSSS 

J Jl ^ GGTTAC GCCATCGGCT ACTCCAGTAT TTCCgSSJ 

fSJ *™ TCAAAGG cacggcttcc ggcaattcgc gcggccattt cggtg?t?S 
1201 gcatctgtcg gttatcagtg gtaa ^ggtgcttcc 
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1 MNKIYRIIWN SALNAWVWS ELTRNHTKRA SATVKTAVLA TX/LFATVQAS 

51 ANRAASVKDV LNAGWNIKGV KPGTTASDNV DFVRTYDTVE FLSAOTKTTT 

101 VNVESKDNGK KTEVKIGAKT SVIKEKDGKL VTGKDKGEMG SSTDEGEGLV 

151 TAKE VI DAVN KAGWRMKTTT ANGQTGQADK FETVTSGTNV TFASGKGTTA 

201 TVSKDDQGNX. TVMYDVNVGD ALNVNQLQNS GWNLDSKAVA GSSGKVISGN 

251 VSPSKGKMDE TVNINAGNNI EITRNGKNID IATSMTPQFS SVSLGAGADA 

301 PTLSVDGDAL NVGSKKUNKP VRITNVAPGV KEGDVTNVAQ LKGVAQNLNU- 

351 RIDNVDGNAR AGIAQAIATA GLVQAYLPGK SMMAIGGGTY RGEAGYAIGY 

401 SSISDGGNWI IKGTASGNSR GHFGASASVG YQW* 



1 ATGAACAAAA TATACCGCAT CATTTGGAAT AGTGCCCTCA ATGCATGGGT 

51 CGTCGTATCC GAGCTCACAC GCAACCACAC CAAACGCGCC TCCGCAACCG 

101 TGAAGACCGC CGTATTGGCG ACTCTGTTGT TTGCAACGGT TCAGGCAAGT 

151 GCTAACCGTG CGGCAAGCGT TAAAGACGTA TTAAACGCTG GCTGGAACAT 

201 TAAAGGCGTT AAACCCGGTA CAACAGCTTC C G ATAACGTT GATTTCGTCC 

251 GCACTTACGA CACAGTCGAG TTCTTGAGCG CAGATACGAA AACAACGACT 

301 GTTAAT GT GG AAAGCAAAGA CAACGGCAAG AAAACCGAAG TTAAAATCGG 

351 TGCGAAGACT TCTGTTATTA AAGAAAAAGA CGGTAAGTTG GTTACTGGTA 

401 AAGACAAAGG CGAGAATGGT TCTTCTACAG ACGAAGGCGA AGGCTTAGTG 

451 ACT GCAAAAG AAGTGATTGA TGCAGTAAAC AAGGCTGGTT GGAGAATGAA 

501 AACAACAACC GCTAATGGTC AAACAGGTCA AGCTGACAAG TTTGAAACCG 

551 TTACATCAGG CACAAATGTA ACCTTTGCTA GTGGTAAAGG TACAACTGCG 

601 ACTGTAAGTA AAGATGATCA AGGCAACATC ACTGTTATGT ATGATGTAAA 

6S1 TGTCGGCGAT GCCCTAAACG TCAATCAGCT GCAAAACAGC GGTTGGAATT 

701 TGGATTCCAA AGCGGTTGCA GGTTCTTCGG GCAAAGT CAT CAGCGGCAAT 

751 GTTTCGCCGA GCAAGGGAAA GATGGAT GAA ACCGTCAACA TTAATGCCGG 

801 CAACAACATC GAGATTACCC GCAACGGTAA AAATATCGAC ATCGCCACTT 

851 CGATGACCCC GCAGTTTTCC AGCGTTTCGC TCGGCGCGGG GGCGGATGCG 

901 CCCACTTTGA GCGTGGATGG GGACGCATTG AATGTCGGCA G CAAGAAGG A 

951 CAACAAACCC GTCCGCATTA CCAATGTCGC CCCGGGCGTT AAAGAGGGGG 

1001 AT GTT AC AAA CGTCGCACAA CTTAAAGGCG TGGCGCAAAA CTTGAACAAC 

1051 CGCAT CGACA ATGTGGACGG CAACGCGCGT GCGGGCATCG CCCAAGCGAT 

1101 TGCAACCGCA GGTCTGGTTC AGGCGTATTT GCCCGGCAAG AGTATGATGG 

1151 CGATCGGCGG CGGCACTTAT CGCGGCGAAG CCGGTTACGC CATCGGCTAC 

1201 TCCAGTATTT CCGACGGCGG AAATTGGATT ATCAAAGGCA CGGCTTCCGG 

1251 CAATTCGCGC GGCCATTTCG GTGCTTCCGC ATCTGTCGGT TATCAGTGGT 

1301 AA 
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1 MNKIYRIIWN SALNAWVWS ELTRNHTKRA SATVKTAVLA TLLFatvoa<? 

31 ANTLKAGDNL KIKQFTYSLK KDLTDLTSVG TBttSSES S^StoS? 

J?J ^^ KETAG ™«»™* GXGSTLTDRA ASVKDVLNAG wSJS 

151 FVRTYDTVEF LSADTKTTTV NVESKDNGKK TEVKIGAKTS VIKEfCDGKLV 

201 TGKDKGENGS STDEGEGLVT AK EVI DAVNK AGWI^KTTTA ISStSSm 

251 ETVTSGTNVT FAS GKGTTAT VSKDDQGNIT VMYDVNVG DA LNwSoSJg' 

III- ESSES? 5 SSG ^"GNV SPSKGKMDET VHIW^» JXSSwS? 

!S ^^ PQFSS v ^ lgagadap tlsvdgdaln vgskkdnkpv ritnvapgvk 

401 egdvtnvaql kgvaqnlnnr idnvdgnara giaqaiatag lvqaSpSs 

501 ^ IGGGTYR S1SDGGNW1I KGTASGNSRG SgSSSS 



1 ATGAACAAAA tataccgcat catttggaat agtgccctca atgcatgggt 

51 CGTCGTATCC GAGCTCACAC GCAACCACAC CAAACGCGCC TCCGCAACCG 
101 TGAAGACCGC CGTATTGGCG ACTCTGTTGT TTGCAACGGT TCAGGCAAGT 
1S1 GCTAACACCC TCAAAGCCGG CGACAACCTG AAAATCAAAC AATTCACCTA 
201 CTCGCTGAAA AAAGACCTCA CAGATCTGAC CAGTGTTGGA ACTGAAAAAT 
251 TATCGTTTAG CGCAAACGGC AATAAAGTCA ACATCACAAG CGACACCAAA 
301 GGCTTGAATT TTGCGAAAGA AACGGCTGGG ACGAACGGCG ACACCACGGT 
351 TCATCTGAAC GGTATTGGTT CGACTTTGAC CGATCGTGCG GCAAGCGTTA 
401 AAGACGTATT AAACGCTGGC TGGAACATTA AAGGCGTTAA AAACGTTGAT 
451 TTCGTCCGCA CTTACGACAC AGTC GAGTTC TTGAGCGCAG ATACGAAAAC 
501 AACGACTGTT AATGTGGAAA GCAAAGACAA CGGCAAGAAA ACCGAAGTTA 
551 AAATCGGTGC GAAGACTTCT GTTATTAAAG AAAAAGACGG TAAGTTGGTT 
601 ACTGGTAAAG ACAAAGGCGA GAATGGTTCT TCTACAGACG AAGGCGAAGG 
651 CTTAGTGACT GCAAAAGAAG TGATTGATGC AGTAAACAAG GCTGGTTGGA 
701 GAATGAAAAC AACAACC6CT AATGGTCAAA CAGGTCAAGC TGACAAGTTT 
751 GAAACCGTTA CAT CAGGCAC AAATGTAACC TTTGCTAGTG GTAAAG6TAC 
801 AACT GCGACT GTAAGTAAAG ATGATCAAGG CAACATCACT GTTATGTATG 
851 ATGTAAATGT CGGCGATGCC CTAAACGTCA ATCAGCTGCA AAACAGCGGT 
901 TGGAATTTGG ATTCCAAAGC GGTTGCAGGT TCTTCGGGCA AAGTCATCAG 
951 CGGCAATGTT TCGCCGAGCA AG GGAAAGAT GGATGAAACC GTCAACATTA 
1001 ATGCCGGCAA CAACATCGAG ATTACCCGCA ACGGTAAAAA TATC GACATC 
1051 GCCACTTCGA TGACCCCGCA GTTTTCCAGC GTTTCGCTCG GCGCGGGGGC 
1101 GGATGCGCCC ACTTTGAGCG TGGATGGGGA CGCATTGAAT GTCGGCAGCA 
1151 AGAAGGACAA CAAACCCGTC CGCATTACCA ATGTCGCCCC GGGCGTTAAA 
1201 GAGGGGGATG TTACAAACGT CGCACAACTT AAAGGCGTGG CGCAAAACTT 
1251 GAACAACCGC ATCGACAATG TGGACGGCAA CGCGCGTGCG GGCATCGCCC 
1301 AAGCGATTGC AACCGCAGGT CTGGTTCAGG CGTATTTGCC CGGCAAGAGT 
1351 ATGATGGCGA TCGGCGGCGG CACTTATCGC GGCGAAGCCG GTTACGCCAT 
1401 CGGCTACTCC AGTATTTCCG ACGGCGGAAA TTGGATTATC AAAGGCACGG 
14 51 CTTCCGGCAA TTCGCGCGGC CATTTCGGTG CTTCCGCATC TGTCGGTTAT 
1501 CAGTGGTAA 
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1 5 

«41 WKiy^ITWN gflLNAWVAVS ET.TRNHTKRA SATVKTAVT. A TLX FAT VQA w 
PMC2 ^ MttKIYK^IW* SALNAWVWS OLTRNHTKRA SA.TVNTAVT A TT T.r*^rXgg 
p£™ U f:\ S""""« 3AL NAWVAVS ELTRNHTKKA SAT V ^AVLA ruSSSS 
^SiS? del MNKIYRIIWJC SALNAWWVS ELTRNHTKRA SATVKTAVLA TI^FATvSS 
FMC21C1C5 jMNKIVRIIWK SALNAWVWS ELTRNHTKRA SATVKTAVLA T LL FAT VQAS 

CI 

51 100 
H41 ATDED..EE £ ELESVQRS.V VGSIQA5MEG SVELET ... I SLSM TMmct. 
mCZ1 ANNEEQ5EYL- YLH PVQRTVA VLIVnSDKEG AGEKEKVEEN SDWAVYF NEK 

H41Studel ATOE I " 7T! — " 

PMC2lBgldel ANNE \ 

PMC21C1C5 AN \\\\ ,WWWWWWW. 

VI 

10X 150 
H41 FVDPVIWTL KAGDNLKI Ko N.TNENTNAS SF TYSLK KPL TGLlNVETFt y 
PMC21 GVLTAREITL K AGDNL K I Kfjl NGTN FTYSLKKDT. TPLt^VGtW 

FMC21C1C5 

VI C2 V2 C3 " 

151 200 
H41 I» S FG ANG KKV NIISPTKGLN FAKETAGT NG DTTVHLNrGIG STTiTDMf.T.M T 
L5FSAHGNKV NITSDTqp LN FAKETAGTNG DTTVHLNGIG STLTnTT.T.MT 
H41Studel LS FGANGKKV NIISDTKGLN FAKETAGTNG DTTVHLNGIG STLTOMLLNT 
PMC21Bgldel LSFSANGNKV NXTSDTKGLN FAKETAGTNG DTTVHLNGIG STLTDTLLNT 
PMC21C1C5 

C3 V3 " 

201 250 
H41 GATTNVTNQN VTDDEKKRAA SVKDVLNAGW N I KGVKFGTT ASDNVDFVRT 
PMC 21 OATTNVTNDN VTDDEKKRAA SVKDVLNAGW KIKGVKPGTT AS DNVQFVRT 
HdlStudel GATTNVTNDN VTDDEKKRAA SVKDVLNAGW NIKGVKFGTT ASDNVDFVRT 
PMC21Bgldel GATTNVTND?? VTDDEKKRAA SVKDVLNAGW NIKGVKPGTT ASDNVDFVRT 

FMC21C1C5 NVDPVRT 

V3 C4 V4 C5 

251 300 

H41 YDTVE5-LSA 3 TKTTTVNVES KDNGKKTEVK IGAKTSVIKE KDGKLVTGKG 

PMC21 YDTVEFLSAD TKTTTVN VES KDNGKKTEVK IGAKTSVIKE KDGKLVTGKD 

H41Studel YDTVEETLSAD TKTTTVNVES KDNGKKTEVK IGAKTSVIKE KDGKLVTGKG 

PMC21Bgldel YDTVEFLSAD TKTTTVNVES KDNGKKTEVK IGAKTSVIKE KOGKLVTGKD 

PMC21C1C5 YDTVE FLS&2 TKTTTVNVES KDNGKKTEVK IGAKTSVIKE KDGKLVTGKD 

CS 



H41 
PMC21 
H41Studel 
PMC2lsgld<sl 
PMC21C1C5 



301 350 
KGENGSSTEE GEGLVTA KEV IDAVNKAGWR MKTTTANGOT GOADKFFTVT 
KGENGSSTDH; GEGLVTAKEV flpAVNKAGWR MKTTTANGQT GQADKFETVT 
KGENGSSTDE GEGLVTAKEV IDAVNKAGWR MKTTTANGQT GQADKFETVT 
KGENGSSTDS GEGLVTAKEV IDAVNKAGWR MKTTTANGQT GQADKFETVT 
KGENGSSTDE GEGLVTAKEV IDAVNKAGWR MKTTTANGQT GQADKFETVT 

C5 



351 400 
S^TKVTFASG NGTTATVSKD DOGNIT VKVD VNVGDALNVN OLONSfiWNTT.n 
SGTNVTFAS^ ftG TTATVSKD DOGNITVMYD VNVGDALNVp OLONSGHNLO 
5GTKVTFASS NGTTATVSKD DQGNITVKYD VNVGDALNVN QLQNSGWNLD 
PMC21Bgld«l SGTNVTFAS^ KGTTATVSKD DQGNITVMYD VNVGDALNVN QLQNSGWNLD 
PMC21C1C5 SGTNVTFASS KGTTATVSKD DQGNITVMYD VNVGDALNVN QLQNSGWNLD 

C5 



H41 
PMC21 
H41Studel 
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401 450 
H41 S jfrVAGSSGK VTgWffpSK QKMPETVNIN AGNNIEITRM ip nirpT^c 
SKAVAGSSGK VISGNVSPSK CKMPEttVNTN AGNNIEIT^T fWpiAT ^ 
p^?» U ?h\ f^VAGSSGK VISGWSPSK GKMDETVNlS AGNNJEITRN GKNIDIATSM 
PMC2XBgldel SKAVAGSSGK VISGNVSPSK GKMDETVNIN AGNNIEITRN GKNIDIATSM 
PMC21C1C5 SKAVA05SGK VISGNVSPSK GKMDETVNIN AGNNIEITRN GKNIDIATSM 

C5 

451 500 
H41 TtOFSSVSLG AGADAPTLSV ODEGALNVfiK TC^ KBVKX T NVAPSVKEG p 
PMC21 TPOFS5VSLG AGADAPTLSV rv ^QALNVGS KKnWPVRTT KvapSv^ 
H41StUd*l TPQFSSVSLG AGADAPTLSV DDEGALNVGS ECDANKPVftIT NVAPGVKEGd 
PMC2lBgldel TPQFSSVSLG AGADAPTLSV DG . DALNVGS KKDNKPVRIT NVAPGVKEGD 
PMC21C1C5 TPQFSSVSLG AGADAPTLSV DG. DALNVGS KK0NKPVRIT NVAPGVKEGD 

C5 

501 550 
H41 VTNVAOLKGV AQNLNNRIDN VNGNARAGlA OAIATAgT. VQ AYLPGKSMMA 
PMC21 VTNVAOLKGV AONLNNR^pN VDGNARAGIA QATATAGLVO AYLPGKSMMA 
H4iStudel VTNVAQLKGV AQNLNNRIDN VNGNARAG I A QAIATAGLVQ AYLPGKSMMA 
PMC2lBgldel VTNVAQLKGV AQNLNNRIDN VDGNARAGIA QAIATAGLVQ AYLPGKSMMA 
PMC21C1C5 VTNVAQLKGV AQNLNNRIDN VDGNARAGIA QAIATAGLVQ AYLPGKSMMA 

C5 



H41 
PMC21 
H4lStudel 
PMC21Bgldel 
PMC21CIC5 



551 600 
IGGGTYLGSA GYAIGYSSIS AGGNW T I KGT ASGNSR GJiFG ASASVGYQK . 
IGGGTYRGEA GYAIGYSSIS DGGNWT TFCGT ASGNSR GH FG ASASVQYQ W. 
IGGGTYLGEA GYAIGYSSIS AGGNWIIKGT ASGNSRGH FG ASASVGYQW. 
IGGGTYRGEA GYAIGYSSIS DGGNWIIKGT AS6NSRGHFG ASA$VGYQW. 
IGGGTYRGEA GYAIGYSSIS DGGNWIIKGT ASGNSRGH FG ASASVGYQW. 

C5 
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52 




YLHPVQRTVA VLIVNSDKEG 


AGEKEKVEEN 


SDWAVYFNEK 


101 

A. V J- 


GVLTARF ttt. 
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NKVNX 1 o DTK 
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LNTGATTNVT 


201 
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251 


SADTKTTTVN 
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IKEKDGKLVT 


GKDKGENGSS 


301 


TDEGEGLVTA 


KEVIDAVNKA GWRMKTTTAN 


GQTGQADKFE 


TVTSGTNVTF 


351 


ASGKGTTATV 


SKDDQGNITV MYDVNVGDAL 


NVNQLQNSGW 


NLDSKAVAGS 


401 


SGKVISGNVS 


PSKGKMDETV NINAGNNIEI 


TRNGKNIDIA 


TSMTPQFSSV 


451 


SLGAGADAPT 


LSVDGDALNV GSKKDNKPVR 


ITNVAPGVKE 


GDVTNVAQLK 


501 


GVAQNLNNRI 


DNVDGNARAG IAQAIATAGL 


VQAYLPGKSM 


MAIGGGTYRG 


551 


EAGYAIGYSS 


ISDGGNWIIK GTASGNSRGH 


FGASASVGYQ 


W* 



B 



52 


TDEDEEEEL 


ESVQRSWGS 


IQASMEGSVE 


LETISLSMTN 


DSKEFVDPYI 


101 


WTLKAGDNL 


KIKQNTNENT 


NASSFTYSLK 


KDLTGLINVE 


TEKLSFGANG 


151 


KKVNIISDTK 


GLNFAKETAG 


TNGDTTVHLN 


GIGSTLTDML 


LNTGATTNVT 


201 


NDNVTDDEKK 


RAASVKDVLN 


AGWNIKGVKP 


GTTASDNVDF 


VRTYDTVEFL 


251 


SADTKTTTVN 


VESKDNGKKT 


EVKIGAKTSV 


IKEKDGKLVT 


GKGKGENGSS 


301 


TDEGEGLVTA 


KEVIDAVNKA 


GWRMKTTTAN 


GQTGQADKFE 


TVTSGTKVTF 


351 


ASGNGTTATV 


SKDDQGNITV 


KYDVNVGDAL 


NVNQLQNSGW 


NLDSKAVAGS 


401 


SGKVISGNVS 


PSKGKMDETV 


NINAGNNIEI 


TRNGKNIDIA 


TSMTPQFSSV 


451 


SLGAGADAPT 


LSVDDEGALN 


VGSKDANKPV 


RITNVAPGVK 


EGDVTNVAQL 


501 


KGVAQNLNNR 


IDNVNGNARA 


GIAQAIATAG 


LVQAYLPGKS 


MMAIGGGTYL 


551 


GEAGYAIGYS 


SISAGGNWII 


KGTASGNSRG 


HFGASASVGY 


QW* 
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52 NNETDLTSV GTEKLSFSAN GNKVNITSDT KGLN FAKE T A GTNGDTTVHL 

101 NGIGSTLTDT LLNTGATTNV TNDNVTDDEK KRAASVKDVL NAGWNIKGVK 

151 PGTTASDNVD FVRTYDTVEF LSADTKTTTV NVESKDNGKK TEVKlGAKTS 

201 VIKEKDGKLV TGKDKGENGS STDEGEGLVT AKEVIDAVNK AGWRMKTTTA 

251 NGQTGQADKF ETVTSGTNVT FASGKGTTAT VSKDDQGNIT VMYDVNVGDA 

301 LNVNQLQNSG WNL DSKAVAG SSGKVISGNV SPSKGKMDET VNINAGNNIE 

351 ITRNGKNIDI ATSMTPQFSS VSLGAGADAP TLSVDGDALN VGSKKDNKFV 

401 RITNVAPGVK EGDVTNVAQL KGVAQNLNNR I DNVDGNARA GIAQAIATAG 

451 LVQAYLPGKS MMAIGGGTYR GEAGYAIGYS SISDGGNWII KGTASGNSRG 

501 HFGASASVGY QW* 



52 


TDETGLINV 


ETEKLSFGAN 


GKKVNIISDT 


KGLNFAKETA 


GTNGDTTVHL 


101 


NGIGSTLTDM 


LLNTGATTNV 


TNDNVTDDEK 


KRAASVKDVL 


NAGWNIKGVK 


151 


PGTTASDNVD 


FVRTYDTVEF 


LSADTKTTTV 


NVESKDNGKK 


TEVKlGAKTS 


201 


VIKEKDGKLV 


TGKGKGENGS 


STDEGEGLVT 


AKEVIDAVNK 


AGWRMKTTTA 


251 


NGQTGQADKF 


ETVTSGTKVT 


FASGNGTTAT 


VSKDDQGNIT 


VKYDVNVGDA 


301 


LNVNQLQNSG 


WNLDSKAVAG 


SSGKVISGNV 


SPSKGKMDET 


VNINAGNNIE 


351 


ITRNGKNIDI 


ATSMTPQFSS 


VSLGAGADAP 


TLSVDDEGAL 


NVGSKDANKP 


401 


VRITNVAPGV 


KEGDVTNVAQ LKGVAQNLNN 


RIDNVNGNAR AGIAQAIATA 


451 


GLVQAYLPGK 


SMMAIGGGTY 


LGEAGYAIGY 


SSISAGGNWI 


IKGTASGNSR 


501 


GHFGASASVG 


YQW* 
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52 


NNVDFVRTY 


DTVEFLSADT 


KTTTVNVESK 


DNGKKTEVKI 


GAKTSVIKEK 


101 


DGKLVTGKDK 


GENGSSTDEG 


EGLVTAKEVT 




rv J. J. J,jr\lNoy J.la 


151 


QADKFETVTS 


GTNVTFASGK 


GTTATVSKDD 


QGNITVMYDV 


NVGDALNVNQ 


201 


LQNSGWNLDS 


KAVAGSSGKV 


ISGNVSPSKG 


KMDETVNINA 


GNNIEITRNG 


251 


KNIDIATSMT 


PQFSSVSLGA 


GADAPTLSVD 


GDALNVGSKK 


DNKPVRITNV 


301 


APGVKEGDVT 


NVAQLKGVAQ 


NLNNRIDNVD 


GNARAGIAQA 


IATAGLVQAY 


351 


LPGKSMMAIG 


GGTYRGEAGY 


AIGYSSISDG 


GNWIIKGTAS 


GNSRGHFGAS 


401 


ASVGYQW* 











52 


NRAASVKDV 


LNAGWNIKGV 


KPGTTASDNV 


DFVRTYDTVE 


FLSADTKTTT 


101 


VNVESKDNGK 


KTEVKIGAKT 


SVIKEKDGKL 


VTGKDKGENG 


SSTDEGEGLV 


151 


TAKE VI DAVN 


KAGWRMKTTT 


ANGQTGQADK 


FETVTSGTNV 


TFASGKGTTA 


201 


TVSKDDQGNI 


TVMYDVNVGD 


ALNVNQLQNS 


GWNLDSKAVA 


GSSGKVISGN 


251 


VSPSKGKMDE 


TVNINAGNNI 


EITRNGKNID 


IATSMTPQFS 


SVSLGAGADA 


301 


PTLSVDGDAL 


NVGSKKDNKP 


VRITNVAPGV 


KEGDVTNVAQ 


LKGVAQNLNN 


351 


RIDNVDGNAR 


AGIAQAIATA 


GLVQAYLPGK 


SMMAIGGGTY 


RGEAGYAIGY 


401 


SSISDGGNWI 


IKGTASGNSR 


GHFGASASVG 


YQW* 





50 SANTLKAGDNL KIKQFTYSLK KDLTDLTSVG TEKLSFSANG NKVNITSDTK 

101 GLNFAKETAG TNGDTTVHLN GIGSTLT DRA ASVKDVLNAG WNIKGVKNVD 

151 FVRTYDTVEF LSADTKTTTV NVESKDNGKK TEVKIGAKTS VXKEKDGKLV 

201 TGKDKGENGS STDEGEGLVT AKE VI DAVNK AGWRMKTTTA NGQTGQADKF 

251 ETVTSGTNVT FASGKGTTAT VSKDDQGNIT VMYDVNVGDA LNVNQLQNSG 

301 WNLDSKAVAG SSGKVISGNV SPSKGKMDET VNINAGNNIE ITRNGKNIDI 

351 ATSMTPQFSS VSLGAGADAP TLSVDGDALN VGSKKDNKPV RITNVAPGVK 

401 EGDVXNVAQL KGVAQNLNNR IDNVDGNARA GIAQAIATAG LVQAYLPGKS 

451 MMAIGGGTYR GEAGYAIGYS SISDGGNWII KGTAS GttS RG HFGASASVGY 

501 QW* 
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